{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "登录cookie <redacted>\n",
      "这是第1页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第2页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第3页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第4页，接下来将先等待10秒...然后以继续抓取\n",
      "这是第5页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第6页，接下来将先等待5秒...然后以继续抓取\n",
      "这是第7页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第8页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第9页，接下来将先等待5秒...然后以继续抓取\n",
      "这是第10页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第11页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第12页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第13页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第14页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第15页，接下来将先等待4秒...然后以继续抓取\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataInfo</th>\n",
       "      <th>dataParams</th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.jobKind</th>\n",
       "      <th>job.topJob</th>\n",
       "      <th>job.link</th>\n",
       "      <th>job.dq</th>\n",
       "      <th>job.title</th>\n",
       "      <th>job.jobId</th>\n",
       "      <th>job.refreshTime</th>\n",
       "      <th>...</th>\n",
       "      <th>recruiter.recruiterPhoto</th>\n",
       "      <th>comp.compLogo</th>\n",
       "      <th>comp.link</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>comp.compId</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>job.requireEduLevel</th>\n",
       "      <th>job.requireWorkYears</th>\n",
       "      <th>comp.compStage</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>%7B%22scene%22%3A%22condition%22%2C%22skId%22%...</td>\n",
       "      <td>{\"jobKind\":\"6\",\"recruiterName\":\"邝女士\",\"userId\":...</td>\n",
       "      <td>[3个月, 本科, 文案策划]</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/lptjob/55349311</td>\n",
       "      <td>深圳-福田区</td>\n",
       "      <td>广告文案实习生</td>\n",
       "      <td>55349311</td>\n",
       "      <td>20230829114648</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f986779c7cc70efbf36c008u.jpg</td>\n",
       "      <td>619f0f281bd4fb704e7abbd902u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13336431/</td>\n",
       "      <td>上海奥美广告有限公司深圳分公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>13336431.0</td>\n",
       "      <td>咨询服务</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>%7B%22scene%22%3A%22condition%22%2C%22skId%22%...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"recruiterName\":\"朱女士\",\"userId\":...</td>\n",
       "      <td>[广告文案]</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1928150619.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>广告文案</td>\n",
       "      <td>28150619</td>\n",
       "      <td>20200603231359</td>\n",
       "      <td>...</td>\n",
       "      <td>5eba8edd4ff090104e4a102307u.png</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/12236489/</td>\n",
       "      <td>华御祥茶科学研究院(深圳)有限公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>12236489.0</td>\n",
       "      <td>培训服务</td>\n",
       "      <td>本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>%7B%22scene%22%3A%22condition%22%2C%22skId%22%...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"recruiterName\":\"徐先生\",\"userId\":...</td>\n",
       "      <td>[新媒体策划, 会议策划, 企业策划, 招商策划, 广告策划, 品牌策划, 营销策划, 活动...</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1950599367.shtml</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>广告文案策划</td>\n",
       "      <td>50599367</td>\n",
       "      <td>20220629074539</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f98698dbe6273dcf8516008u.jpg</td>\n",
       "      <td>5f4b6b70f6d1ab584743aa4504u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/12374979/</td>\n",
       "      <td>深圳新叶影视传媒有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>12374979.0</td>\n",
       "      <td>广播/影视/录音</td>\n",
       "      <td>本科</td>\n",
       "      <td>一年以下</td>\n",
       "      <td>融资未公开</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>%7B%22scene%22%3A%22condition%22%2C%22skId%22%...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"recruiterName\":\"徐女士\",\"userId\":...</td>\n",
       "      <td>[公众号, 文案策划]</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1953446233.shtml</td>\n",
       "      <td>深圳-福田区</td>\n",
       "      <td>广告文案策划</td>\n",
       "      <td>53446233</td>\n",
       "      <td>20221028142027</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/9511270/</td>\n",
       "      <td>广东知恒律师事务所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>9511270.0</td>\n",
       "      <td>法律服务</td>\n",
       "      <td>本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>%7B%22scene%22%3A%22condition%22%2C%22skId%22%...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"recruiterName\":\"潘女士\",\"userId\":...</td>\n",
       "      <td>[广告文案, 新媒体文案]</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1938952859.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>广告文案策划</td>\n",
       "      <td>38952859</td>\n",
       "      <td>20210510093306</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/12732883/</td>\n",
       "      <td>深圳笑响传媒有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>12732883.0</td>\n",
       "      <td>专业技术服务</td>\n",
       "      <td>本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"userId\":\"0dc65e3d9e20a45fd5405...</td>\n",
       "      <td>[广告投放, 文案]</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1938840273.shtml</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>FB 海外推广负责人</td>\n",
       "      <td>38840273</td>\n",
       "      <td>20210506142937</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>601395e57d90cc70b4d23f0e03u.png</td>\n",
       "      <td>https://www.liepin.com/company/12481123/</td>\n",
       "      <td>深圳为华网络科技有限公司</td>\n",
       "      <td>1000-2000人</td>\n",
       "      <td>12481123.0</td>\n",
       "      <td>互联网</td>\n",
       "      <td>本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"userId\":\"961079ca3c014fec97fe4...</td>\n",
       "      <td>[市场推广, 市场策划, 市场调研分析, 活动策划, 广告策划, 市场营销, 广告媒介, 营...</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1923016703.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>市场营销专员</td>\n",
       "      <td>23016703</td>\n",
       "      <td>20221107184837</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>5bfea12574719d2aa34c1a0f03a.png</td>\n",
       "      <td>https://www.liepin.com/company/9378436/</td>\n",
       "      <td>深圳市华盛昌科技实业股份有限公司</td>\n",
       "      <td>1000-2000人</td>\n",
       "      <td>9378436.0</td>\n",
       "      <td>仪器仪表</td>\n",
       "      <td>本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>沪深A股上市</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"userId\":\"df21d8a0f87dced3a687a...</td>\n",
       "      <td>[策划]</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1929978881.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>市场策划主任</td>\n",
       "      <td>29978881</td>\n",
       "      <td>20200922172336</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f986779c7cc70efbf36c008u.jpg</td>\n",
       "      <td>5c106d66570cb120f1860ee202u.png</td>\n",
       "      <td>https://www.liepin.com/company/9126093/</td>\n",
       "      <td>广州市时代胜誉投资有限公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>9126093.0</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"userId\":\"2eff24c01ce82ae8096c4...</td>\n",
       "      <td>[品牌策划, 品牌设计, 品牌推广, 广告媒体, 广告媒介, 企业品牌, 自媒体, 广告/传...</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1952945195.shtml</td>\n",
       "      <td>深圳-罗湖区</td>\n",
       "      <td>品牌策划主管</td>\n",
       "      <td>52945195</td>\n",
       "      <td>20221006100807</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f98648dbe6273dcf8515508u.jpg</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/12800845/</td>\n",
       "      <td>深圳市东方嘉裕实业有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>12800845.0</td>\n",
       "      <td>珠宝/首饰</td>\n",
       "      <td>本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"userId\":\"e5f8a8d1990818486d7bb...</td>\n",
       "      <td>[ae, 视频广告, 广告创意, am, ad]</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>https://www.liepin.com/job/1940139851.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>广告创意</td>\n",
       "      <td>40139851</td>\n",
       "      <td>20230915100742</td>\n",
       "      <td>...</td>\n",
       "      <td>6371af31afeb7c1758403d3401u.png</td>\n",
       "      <td>5bfe9f9474719d2aa34bcc4903a.png</td>\n",
       "      <td>https://www.liepin.com/company/8574135/</td>\n",
       "      <td>深圳市点维文化传播有限公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>8574135.0</td>\n",
       "      <td>广告/公关/会展</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>582 rows × 32 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                             dataInfo  \\\n",
       "0   %7B%22scene%22%3A%22condition%22%2C%22skId%22%...   \n",
       "1   %7B%22scene%22%3A%22condition%22%2C%22skId%22%...   \n",
       "2   %7B%22scene%22%3A%22condition%22%2C%22skId%22%...   \n",
       "3   %7B%22scene%22%3A%22condition%22%2C%22skId%22%...   \n",
       "4   %7B%22scene%22%3A%22condition%22%2C%22skId%22%...   \n",
       "..                                                ...   \n",
       "17  %7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...   \n",
       "18  %7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...   \n",
       "19  %7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...   \n",
       "20  %7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...   \n",
       "21  %7B%22jobKind%22%3A%222%22%2C%22pageSize%22%3A...   \n",
       "\n",
       "                                           dataParams  \\\n",
       "0   {\"jobKind\":\"6\",\"recruiterName\":\"邝女士\",\"userId\":...   \n",
       "1   {\"jobKind\":\"2\",\"recruiterName\":\"朱女士\",\"userId\":...   \n",
       "2   {\"jobKind\":\"2\",\"recruiterName\":\"徐先生\",\"userId\":...   \n",
       "3   {\"jobKind\":\"2\",\"recruiterName\":\"徐女士\",\"userId\":...   \n",
       "4   {\"jobKind\":\"2\",\"recruiterName\":\"潘女士\",\"userId\":...   \n",
       "..                                                ...   \n",
       "17  {\"jobKind\":\"2\",\"userId\":\"0dc65e3d9e20a45fd5405...   \n",
       "18  {\"jobKind\":\"2\",\"userId\":\"961079ca3c014fec97fe4...   \n",
       "19  {\"jobKind\":\"2\",\"userId\":\"df21d8a0f87dced3a687a...   \n",
       "20  {\"jobKind\":\"2\",\"userId\":\"2eff24c01ce82ae8096c4...   \n",
       "21  {\"jobKind\":\"2\",\"userId\":\"e5f8a8d1990818486d7bb...   \n",
       "\n",
       "                                           job.labels job.jobKind  job.topJob  \\\n",
       "0                                     [3个月, 本科, 文案策划]           6       False   \n",
       "1                                              [广告文案]           2       False   \n",
       "2   [新媒体策划, 会议策划, 企业策划, 招商策划, 广告策划, 品牌策划, 营销策划, 活动...           2       False   \n",
       "3                                         [公众号, 文案策划]           2       False   \n",
       "4                                       [广告文案, 新媒体文案]           2       False   \n",
       "..                                                ...         ...         ...   \n",
       "17                                         [广告投放, 文案]           2       False   \n",
       "18  [市场推广, 市场策划, 市场调研分析, 活动策划, 广告策划, 市场营销, 广告媒介, 营...           2       False   \n",
       "19                                               [策划]           2       False   \n",
       "20  [品牌策划, 品牌设计, 品牌推广, 广告媒体, 广告媒介, 企业品牌, 自媒体, 广告/传...           2       False   \n",
       "21                           [ae, 视频广告, 广告创意, am, ad]           2       False   \n",
       "\n",
       "                                       job.link  job.dq   job.title job.jobId  \\\n",
       "0        https://www.liepin.com/lptjob/55349311  深圳-福田区     广告文案实习生  55349311   \n",
       "1   https://www.liepin.com/job/1928150619.shtml      深圳        广告文案  28150619   \n",
       "2   https://www.liepin.com/job/1950599367.shtml  深圳-南山区      广告文案策划  50599367   \n",
       "3   https://www.liepin.com/job/1953446233.shtml  深圳-福田区      广告文案策划  53446233   \n",
       "4   https://www.liepin.com/job/1938952859.shtml      深圳      广告文案策划  38952859   \n",
       "..                                          ...     ...         ...       ...   \n",
       "17  https://www.liepin.com/job/1938840273.shtml  深圳-南山区  FB 海外推广负责人  38840273   \n",
       "18  https://www.liepin.com/job/1923016703.shtml      深圳      市场营销专员  23016703   \n",
       "19  https://www.liepin.com/job/1929978881.shtml      深圳      市场策划主任  29978881   \n",
       "20  https://www.liepin.com/job/1952945195.shtml  深圳-罗湖区      品牌策划主管  52945195   \n",
       "21  https://www.liepin.com/job/1940139851.shtml      深圳        广告创意  40139851   \n",
       "\n",
       "   job.refreshTime  ...         recruiter.recruiterPhoto  \\\n",
       "0   20230829114648  ...  5f8f986779c7cc70efbf36c008u.jpg   \n",
       "1   20200603231359  ...  5eba8edd4ff090104e4a102307u.png   \n",
       "2   20220629074539  ...  5f8f98698dbe6273dcf8516008u.jpg   \n",
       "3   20221028142027  ...  5f8f9866dfb13a7dee342f1808u.jpg   \n",
       "4   20210510093306  ...  5f8f9865ea60860b75384fa508u.jpg   \n",
       "..             ...  ...                              ...   \n",
       "17  20210506142937  ...  5f8f9866dfb13a7dee342f1808u.jpg   \n",
       "18  20221107184837  ...  5f8f9865ea60860b75384fa508u.jpg   \n",
       "19  20200922172336  ...  5f8f986779c7cc70efbf36c008u.jpg   \n",
       "20  20221006100807  ...  5f8f98648dbe6273dcf8515508u.jpg   \n",
       "21  20230915100742  ...  6371af31afeb7c1758403d3401u.png   \n",
       "\n",
       "                      comp.compLogo                                 comp.link  \\\n",
       "0   619f0f281bd4fb704e7abbd902u.jpg  https://www.liepin.com/company/13336431/   \n",
       "1   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/12236489/   \n",
       "2   5f4b6b70f6d1ab584743aa4504u.jpg  https://www.liepin.com/company/12374979/   \n",
       "3   61b07937d0458d53c627567e02u.jpg   https://www.liepin.com/company/9511270/   \n",
       "4   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/12732883/   \n",
       "..                              ...                                       ...   \n",
       "17  601395e57d90cc70b4d23f0e03u.png  https://www.liepin.com/company/12481123/   \n",
       "18  5bfea12574719d2aa34c1a0f03a.png   https://www.liepin.com/company/9378436/   \n",
       "19  5c106d66570cb120f1860ee202u.png   https://www.liepin.com/company/9126093/   \n",
       "20  61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/12800845/   \n",
       "21  5bfe9f9474719d2aa34bcc4903a.png   https://www.liepin.com/company/8574135/   \n",
       "\n",
       "        comp.compName comp.compScale comp.compId comp.compIndustry  \\\n",
       "0     上海奥美广告有限公司深圳分公司          1-49人  13336431.0              咨询服务   \n",
       "1   华御祥茶科学研究院(深圳)有限公司         50-99人  12236489.0              培训服务   \n",
       "2        深圳新叶影视传媒有限公司       100-499人  12374979.0          广播/影视/录音   \n",
       "3           广东知恒律师事务所          1-49人   9511270.0              法律服务   \n",
       "4          深圳笑响传媒有限公司          1-49人  12732883.0            专业技术服务   \n",
       "..                ...            ...         ...               ...   \n",
       "17       深圳为华网络科技有限公司     1000-2000人  12481123.0               互联网   \n",
       "18   深圳市华盛昌科技实业股份有限公司     1000-2000人   9378436.0              仪器仪表   \n",
       "19      广州市时代胜誉投资有限公司       10000人以上   9126093.0           房地产开发经营   \n",
       "20      深圳市东方嘉裕实业有限公司          1-49人  12800845.0             珠宝/首饰   \n",
       "21      深圳市点维文化传播有限公司         50-99人   8574135.0          广告/公关/会展   \n",
       "\n",
       "   job.requireEduLevel job.requireWorkYears comp.compStage  \n",
       "0                  NaN                  NaN            NaN  \n",
       "1                   本科                 经验不限            NaN  \n",
       "2                   本科                 一年以下          融资未公开  \n",
       "3                   本科                 经验不限            NaN  \n",
       "4                   本科                 经验不限            NaN  \n",
       "..                 ...                  ...            ...  \n",
       "17                  本科                5-10年            NaN  \n",
       "18                  本科                 3-5年         沪深A股上市  \n",
       "19                统招本科                 3-5年            NaN  \n",
       "20                  本科                 3-5年            NaN  \n",
       "21                统招本科                 3-5年            NaN  \n",
       "\n",
       "[582 rows x 32 columns]"
      ]
     },
     "execution_count": 1,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import crawl_liepin\n",
    "\n",
    "# Baseline crawl: no 登录cookie argument is passed here, so crawl_liepin uses\n",
    "# whatever default it defines. The result is bound to a name (instead of being\n",
    "# discarded after display) so this slow multi-page crawl does not have to be\n",
    "# repeated to inspect or compare the data later.\n",
    "广告文案_深圳_未登录_results = crawl_liepin.crawl(城市=\"深圳\", 关键词=\"广告文案\", 学历=\"本科\", 工作经验=\"\")\n",
    "广告文案_深圳_未登录_results"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 1. cookies实现登录，获取完整数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'<redacted>'"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the Liepin login cookie without hardcoding it in the notebook.\n",
    "# A session cookie is a credential: committing it (or echoing it into the\n",
    "# saved cell output) lets anyone with the file reuse the logged-in session.\n",
    "import os\n",
    "from getpass import getpass\n",
    "\n",
    "# Prefer the LIEPIN_COOKIE environment variable; otherwise prompt for it\n",
    "# (getpass does not echo the pasted value).\n",
    "cookie = (os.environ.get(\"LIEPIN_COOKIE\") or getpass(\"Liepin cookie: \")).strip()\n",
    "if not cookie:\n",
    "    raise ValueError(\"A Liepin login cookie is required: set LIEPIN_COOKIE or paste it at the prompt.\")\n",
    "\n",
    "# Display only the length so the secret never lands in the stored output.\n",
    "f\"cookie loaded ({len(cookie)} characters)\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "登录cookie <redacted>\n",
      "这是第1页，接下来将先等待8秒...然后以继续抓取\n",
      "这是第2页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第3页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第4页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第5页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第6页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第7页，接下来将先等待5秒...然后以继续抓取\n",
      "这是第8页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第9页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第10页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第11页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第12页，接下来将先等待5秒...然后以继续抓取\n",
      "这是第13页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第14页，接下来将先等待10秒...然后以继续抓取\n",
      "这是第15页，接下来将先等待7秒...然后以继续抓取\n"
     ]
    }
   ],
   "source": [
    "import crawl_liepin\n",
    "\n",
    "# Run the search again, this time handing the `cookie` variable to the crawler\n",
    "# through the 登录cookie keyword, and keep the returned result for later cells.\n",
    "广告文案_深圳_results = crawl_liepin.crawl(\n",
    "    城市=\"深圳\",\n",
    "    关键词=\"广告文案\",\n",
    "    学历=\"本科\",\n",
    "    工作经验=\"\",  # presumably means no experience filter; confirm in crawl_liepin\n",
    "    登录cookie=cookie,\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 2. 使用数据分析进行数据交互式可视化"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<bound method DataFrame.to_html of                                              dataInfo  \\\n",
       "0   %7B%22jobId%22%3A%2255349311%22%2C%22pageSize%...   \n",
       "1   %7B%22jobId%22%3A%2228150619%22%2C%22pageSize%...   \n",
       "2   %7B%22jobId%22%3A%2250599367%22%2C%22pageSize%...   \n",
       "3   %7B%22jobId%22%3A%2253446233%22%2C%22pageSize%...   \n",
       "4   %7B%22jobId%22%3A%2238952859%22%2C%22pageSize%...   \n",
       "..                                                ...   \n",
       "17  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22ckId...   \n",
       "18  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22ckId...   \n",
       "19  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22ckId...   \n",
       "20  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22ckId...   \n",
       "21  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22ckId...   \n",
       "\n",
       "                                           dataParams  \\\n",
       "0   {\"jobId\":\"55349311\",\"imId\":\"079c6af93eb22be9aa...   \n",
       "1   {\"jobId\":\"28150619\",\"imId\":\"f8b39aaa0ec65e4029...   \n",
       "2   {\"jobId\":\"50599367\",\"imId\":\"53f9830b05847f35c1...   \n",
       "3   {\"jobId\":\"53446233\",\"imId\":\"6967079578f3b3ab84...   \n",
       "4   {\"jobId\":\"38952859\",\"imId\":\"1ab376ef323ad88540...   \n",
       "..                                                ...   \n",
       "17  {\"recruiterPhoto\":\"5f8f9866dfb13a7dee342f1808u...   \n",
       "18  {\"recruiterPhoto\":\"5f8f9865ea60860b75384fa508u...   \n",
       "19  {\"recruiterPhoto\":\"5f8f986779c7cc70efbf36c008u...   \n",
       "20  {\"recruiterPhoto\":\"5f8f98648dbe6273dcf8515508u...   \n",
       "21  {\"recruiterPhoto\":\"6371af31afeb7c1758403d3401u...   \n",
       "\n",
       "                                           job.labels  \\\n",
       "0                                     [3个月, 本科, 文案策划]   \n",
       "1                                              [广告文案]   \n",
       "2   [新媒体策划, 会议策划, 企业策划, 招商策划, 广告策划, 品牌策划, 营销策划, 活动...   \n",
       "3                                         [公众号, 文案策划]   \n",
       "4                                       [广告文案, 新媒体文案]   \n",
       "..                                                ...   \n",
       "17                                         [广告投放, 文案]   \n",
       "18  [市场推广, 市场策划, 市场调研分析, 活动策划, 广告策划, 市场营销, 广告媒介, 营...   \n",
       "19                                               [策划]   \n",
       "20  [品牌策划, 品牌设计, 品牌推广, 广告媒体, 广告媒介, 企业品牌, 自媒体, 广告/传...   \n",
       "21                           [ae, 视频广告, 广告创意, am, ad]   \n",
       "\n",
       "                                       job.link job.jobId  job.dq  job.topJob  \\\n",
       "0        https://www.liepin.com/lptjob/55349311  55349311  深圳-福田区       False   \n",
       "1   https://www.liepin.com/job/1928150619.shtml  28150619      深圳       False   \n",
       "2   https://www.liepin.com/job/1950599367.shtml  50599367  深圳-南山区       False   \n",
       "3   https://www.liepin.com/job/1953446233.shtml  53446233  深圳-福田区       False   \n",
       "4   https://www.liepin.com/job/1938952859.shtml  38952859      深圳       False   \n",
       "..                                          ...       ...     ...         ...   \n",
       "17  https://www.liepin.com/job/1938840273.shtml  38840273  深圳-南山区       False   \n",
       "18  https://www.liepin.com/job/1923016703.shtml  23016703      深圳       False   \n",
       "19  https://www.liepin.com/job/1929978881.shtml  29978881      深圳       False   \n",
       "20  https://www.liepin.com/job/1952945195.shtml  52945195  深圳-罗湖区       False   \n",
       "21  https://www.liepin.com/job/1940139851.shtml  40139851      深圳       False   \n",
       "\n",
       "   job.refreshTime job.jobKind   job.title  ...  \\\n",
       "0   20230829114648           6     广告文案实习生  ...   \n",
       "1   20200603231359           2        广告文案  ...   \n",
       "2   20220629074539           2      广告文案策划  ...   \n",
       "3   20221028142027           2      广告文案策划  ...   \n",
       "4   20210510093306           2      广告文案策划  ...   \n",
       "..             ...         ...         ...  ...   \n",
       "17  20210506142937           2  FB 海外推广负责人  ...   \n",
       "18  20221107184837           2      市场营销专员  ...   \n",
       "19  20200922172336           2      市场策划主任  ...   \n",
       "20  20221006100807           2      品牌策划主管  ...   \n",
       "21  20230915100742           2        广告创意  ...   \n",
       "\n",
       "           recruiter.recruiterPhoto                                 comp.link  \\\n",
       "0   5f8f986779c7cc70efbf36c008u.jpg  https://www.liepin.com/company/13336431/   \n",
       "1   5eba8edd4ff090104e4a102307u.png  https://www.liepin.com/company/12236489/   \n",
       "2   5f8f98698dbe6273dcf8516008u.jpg  https://www.liepin.com/company/12374979/   \n",
       "3   5f8f9866dfb13a7dee342f1808u.jpg   https://www.liepin.com/company/9511270/   \n",
       "4   5f8f9865ea60860b75384fa508u.jpg  https://www.liepin.com/company/12732883/   \n",
       "..                              ...                                       ...   \n",
       "17  5f8f9866dfb13a7dee342f1808u.jpg  https://www.liepin.com/company/12481123/   \n",
       "18  5f8f9865ea60860b75384fa508u.jpg   https://www.liepin.com/company/9378436/   \n",
       "19  5f8f986779c7cc70efbf36c008u.jpg   https://www.liepin.com/company/9126093/   \n",
       "20  5f8f98648dbe6273dcf8515508u.jpg  https://www.liepin.com/company/12800845/   \n",
       "21  6371af31afeb7c1758403d3401u.png   https://www.liepin.com/company/8574135/   \n",
       "\n",
       "   comp.compId comp.compScale                    comp.compLogo  \\\n",
       "0   13336431.0          1-49人  619f0f281bd4fb704e7abbd902u.jpg   \n",
       "1   12236489.0         50-99人  61b07937d0458d53c627567e02u.jpg   \n",
       "2   12374979.0       100-499人  5f4b6b70f6d1ab584743aa4504u.jpg   \n",
       "3    9511270.0          1-49人  61b07937d0458d53c627567e02u.jpg   \n",
       "4   12732883.0          1-49人  61b07937d0458d53c627567e02u.jpg   \n",
       "..         ...            ...                              ...   \n",
       "17  12481123.0     1000-2000人  601395e57d90cc70b4d23f0e03u.png   \n",
       "18   9378436.0     1000-2000人  5bfea12574719d2aa34c1a0f03a.png   \n",
       "19   9126093.0       10000人以上  5c106d66570cb120f1860ee202u.png   \n",
       "20  12800845.0          1-49人  61b07937d0458d53c627567e02u.jpg   \n",
       "21   8574135.0         50-99人  5bfe9f9474719d2aa34bcc4903a.png   \n",
       "\n",
       "   comp.compIndustry      comp.compName job.requireWorkYears  \\\n",
       "0               咨询服务    上海奥美广告有限公司深圳分公司                  NaN   \n",
       "1               培训服务  华御祥茶科学研究院(深圳)有限公司                 经验不限   \n",
       "2           广播/影视/录音       深圳新叶影视传媒有限公司                 一年以下   \n",
       "3               法律服务          广东知恒律师事务所                 经验不限   \n",
       "4             专业技术服务         深圳笑响传媒有限公司                 经验不限   \n",
       "..               ...                ...                  ...   \n",
       "17               互联网       深圳为华网络科技有限公司                5-10年   \n",
       "18              仪器仪表   深圳市华盛昌科技实业股份有限公司                 3-5年   \n",
       "19           房地产开发经营      广州市时代胜誉投资有限公司                 3-5年   \n",
       "20             珠宝/首饰      深圳市东方嘉裕实业有限公司                 3-5年   \n",
       "21          广告/公关/会展      深圳市点维文化传播有限公司                 3-5年   \n",
       "\n",
       "    job.requireEduLevel comp.compStage  \n",
       "0                   NaN            NaN  \n",
       "1                    本科            NaN  \n",
       "2                    本科          融资未公开  \n",
       "3                    本科            NaN  \n",
       "4                    本科            NaN  \n",
       "..                  ...            ...  \n",
       "17                   本科            NaN  \n",
       "18                   本科         沪深A股上市  \n",
       "19                 统招本科            NaN  \n",
       "20                   本科            NaN  \n",
       "21                 统招本科            NaN  \n",
       "\n",
       "[582 rows x 32 columns]>"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "广告文案_深圳_results.to_html"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['dataInfo', 'dataParams', 'job.labels', 'job.link', 'job.jobId',\n",
       "       'job.dq', 'job.topJob', 'job.refreshTime', 'job.jobKind', 'job.title',\n",
       "       'job.advViewFlag', 'job.pcOuterLink', 'job.h5OuterLink', 'job.salary',\n",
       "       'job.campusJobKind', 'job.dataPromId', 'recruiter.imId',\n",
       "       'recruiter.imUserType', 'recruiter.chatted', 'recruiter.recruiterName',\n",
       "       'recruiter.recruiterTitle', 'recruiter.recruiterId',\n",
       "       'recruiter.recruiterPhoto', 'comp.link', 'comp.compId',\n",
       "       'comp.compScale', 'comp.compLogo', 'comp.compIndustry', 'comp.compName',\n",
       "       'job.requireWorkYears', 'job.requireEduLevel', 'comp.compStage'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "广告文案_深圳_results.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "深圳-南山区    169\n",
       "深圳        154\n",
       "深圳-宝安区     61\n",
       "深圳-龙岗区     58\n",
       "深圳-龙华区     52\n",
       "深圳-福田区     50\n",
       "深圳-罗湖区     32\n",
       "深圳-光明区      2\n",
       "深圳-坪山区      2\n",
       "深圳-盐田区      2\n",
       "Name: job.dq, dtype: int64"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "series_dq = 广告文案_深圳_results['job.dq'].value_counts()\n",
    "series_dq"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['深圳-南山区',\n",
       " '深圳-宝安区',\n",
       " '深圳-龙岗区',\n",
       " '深圳-龙华区',\n",
       " '深圳-福田区',\n",
       " '深圳-罗湖区',\n",
       " '深圳-光明区',\n",
       " '深圳-坪山区',\n",
       " '深圳-盐田区']"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dq_name= [i for i in series_dq.index if '-' in i]\n",
    "dq_name"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([169,  61,  58,  52,  50,  32,   2,   2,   2], dtype=int64)"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "series_dq[dq_name].values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Requirement already satisfied: pyecharts in d:\\python\\lib\\site-packages (2.0.3)\n",
      "Requirement already satisfied: jinja2 in d:\\python\\lib\\site-packages (from pyecharts) (3.1.2)\n",
      "Requirement already satisfied: prettytable in d:\\python\\lib\\site-packages (from pyecharts) (3.7.0)\n",
      "Requirement already satisfied: simplejson in d:\\python\\lib\\site-packages (from pyecharts) (3.19.1)\n",
      "Requirement already satisfied: MarkupSafe>=2.0 in d:\\python\\lib\\site-packages (from jinja2->pyecharts) (2.1.2)\n",
      "Requirement already satisfied: wcwidth in d:\\python\\lib\\site-packages (from prettytable->pyecharts) (0.2.6)\n"
     ]
    }
   ],
   "source": [
    "!pip install pyecharts"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "from pyecharts import options as opts\n",
    "from pyecharts.charts import Map\n",
    "from pyecharts.faker import Faker\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['南山区', '宝安区', '龙岗区', '龙华区', '福田区', '罗湖区', '光明区', '坪山区', '盐田区']"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[i.split('-')[1] for i in dq_name]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[169, 61, 58, 52, 50, 32, 2, 2, 2]"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "series_dq[dq_name].values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "<script>\n",
       "    require.config({\n",
       "        paths: {\n",
       "            'echarts':'https://assets.pyecharts.org/assets/v5/echarts.min', '深圳':'https://assets.pyecharts.org/assets/v5/maps/guang3_dong1_shen1_zhen4'\n",
       "        }\n",
       "    });\n",
       "</script>\n",
       "\n",
       "        <div id=\"98d9ea2cc0614ebbaa308c36e445c838\" style=\"width:900px; height:500px;\"></div>\n",
       "\n",
       "<script>\n",
       "        require(['echarts', '深圳'], function(echarts) {\n",
       "                var chart_98d9ea2cc0614ebbaa308c36e445c838 = echarts.init(\n",
       "                    document.getElementById('98d9ea2cc0614ebbaa308c36e445c838'), 'white', {renderer: 'canvas'});\n",
       "                var option_98d9ea2cc0614ebbaa308c36e445c838 = {\n",
       "    \"animation\": true,\n",
       "    \"animationThreshold\": 2000,\n",
       "    \"animationDuration\": 1000,\n",
       "    \"animationEasing\": \"cubicOut\",\n",
       "    \"animationDelay\": 0,\n",
       "    \"animationDurationUpdate\": 300,\n",
       "    \"animationEasingUpdate\": \"cubicOut\",\n",
       "    \"animationDelayUpdate\": 0,\n",
       "    \"aria\": {\n",
       "        \"enabled\": false\n",
       "    },\n",
       "    \"color\": [\n",
       "        \"#5470c6\",\n",
       "        \"#91cc75\",\n",
       "        \"#fac858\",\n",
       "        \"#ee6666\",\n",
       "        \"#73c0de\",\n",
       "        \"#3ba272\",\n",
       "        \"#fc8452\",\n",
       "        \"#9a60b4\",\n",
       "        \"#ea7ccc\"\n",
       "    ],\n",
       "    \"series\": [\n",
       "        {\n",
       "            \"type\": \"map\",\n",
       "            \"name\": \"\\u5e7f\\u544a\\u6587\\u6848\\u5730\\u533a\\u5206\\u5e03\",\n",
       "            \"label\": {\n",
       "                \"show\": true,\n",
       "                \"margin\": 8\n",
       "            },\n",
       "            \"map\": \"\\u6df1\\u5733\",\n",
       "            \"data\": [\n",
       "                {\n",
       "                    \"name\": \"\\u5357\\u5c71\\u533a\",\n",
       "                    \"value\": 169\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u5b9d\\u5b89\\u533a\",\n",
       "                    \"value\": 61\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u9f99\\u5c97\\u533a\",\n",
       "                    \"value\": 58\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u9f99\\u534e\\u533a\",\n",
       "                    \"value\": 52\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u798f\\u7530\\u533a\",\n",
       "                    \"value\": 50\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u7f57\\u6e56\\u533a\",\n",
       "                    \"value\": 32\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u5149\\u660e\\u533a\",\n",
       "                    \"value\": 2\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u576a\\u5c71\\u533a\",\n",
       "                    \"value\": 2\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u76d0\\u7530\\u533a\",\n",
       "                    \"value\": 2\n",
       "                }\n",
       "            ],\n",
       "            \"roam\": true,\n",
       "            \"aspectScale\": 0.75,\n",
       "            \"nameProperty\": \"name\",\n",
       "            \"selectedMode\": false,\n",
       "            \"zoom\": 1,\n",
       "            \"zlevel\": 0,\n",
       "            \"z\": 2,\n",
       "            \"seriesLayoutBy\": \"column\",\n",
       "            \"datasetIndex\": 0,\n",
       "            \"mapValueCalculation\": \"sum\",\n",
       "            \"showLegendSymbol\": true,\n",
       "            \"emphasis\": {}\n",
       "        }\n",
       "    ],\n",
       "    \"legend\": [\n",
       "        {\n",
       "            \"data\": [\n",
       "                \"\\u5e7f\\u544a\\u6587\\u6848\\u5730\\u533a\\u5206\\u5e03\"\n",
       "            ],\n",
       "            \"selected\": {},\n",
       "            \"show\": true,\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"itemWidth\": 25,\n",
       "            \"itemHeight\": 14,\n",
       "            \"backgroundColor\": \"transparent\",\n",
       "            \"borderColor\": \"#ccc\",\n",
       "            \"borderWidth\": 1,\n",
       "            \"borderRadius\": 0,\n",
       "            \"pageButtonItemGap\": 5,\n",
       "            \"pageButtonPosition\": \"end\",\n",
       "            \"pageFormatter\": \"{current}/{total}\",\n",
       "            \"pageIconColor\": \"#2f4554\",\n",
       "            \"pageIconInactiveColor\": \"#aaa\",\n",
       "            \"pageIconSize\": 15,\n",
       "            \"animationDurationUpdate\": 800,\n",
       "            \"selector\": false,\n",
       "            \"selectorPosition\": \"auto\",\n",
       "            \"selectorItemGap\": 7,\n",
       "            \"selectorButtonGap\": 10\n",
       "        }\n",
       "    ],\n",
       "    \"tooltip\": {\n",
       "        \"show\": true,\n",
       "        \"trigger\": \"item\",\n",
       "        \"triggerOn\": \"mousemove|click\",\n",
       "        \"axisPointer\": {\n",
       "            \"type\": \"line\"\n",
       "        },\n",
       "        \"showContent\": true,\n",
       "        \"alwaysShowContent\": false,\n",
       "        \"showDelay\": 0,\n",
       "        \"hideDelay\": 100,\n",
       "        \"enterable\": false,\n",
       "        \"confine\": false,\n",
       "        \"appendToBody\": false,\n",
       "        \"transitionDuration\": 0.4,\n",
       "        \"textStyle\": {\n",
       "            \"fontSize\": 14\n",
       "        },\n",
       "        \"borderWidth\": 0,\n",
       "        \"padding\": 5,\n",
       "        \"order\": \"seriesAsc\"\n",
       "    },\n",
       "    \"title\": [\n",
       "        {\n",
       "            \"show\": true,\n",
       "            \"text\": \"Map-\\u6df1\\u5733-\\u5e7f\\u544a\\u6587\\u6848\",\n",
       "            \"target\": \"blank\",\n",
       "            \"subtarget\": \"blank\",\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"textAlign\": \"auto\",\n",
       "            \"textVerticalAlign\": \"auto\",\n",
       "            \"triggerEvent\": false\n",
       "        }\n",
       "    ],\n",
       "    \"visualMap\": {\n",
       "        \"show\": true,\n",
       "        \"type\": \"continuous\",\n",
       "        \"min\": 0,\n",
       "        \"max\": 100,\n",
       "        \"inRange\": {\n",
       "            \"color\": [\n",
       "                \"#50a3ba\",\n",
       "                \"#eac763\",\n",
       "                \"#d94e5d\"\n",
       "            ]\n",
       "        },\n",
       "        \"calculable\": true,\n",
       "        \"inverse\": false,\n",
       "        \"splitNumber\": 5,\n",
       "        \"hoverLink\": true,\n",
       "        \"orient\": \"vertical\",\n",
       "        \"padding\": 5,\n",
       "        \"showLabel\": true,\n",
       "        \"itemWidth\": 20,\n",
       "        \"itemHeight\": 140,\n",
       "        \"borderWidth\": 0\n",
       "    }\n",
       "};\n",
       "                chart_98d9ea2cc0614ebbaa308c36e445c838.setOption(option_98d9ea2cc0614ebbaa308c36e445c838);\n",
       "        });\n",
       "    </script>\n"
      ],
      "text/plain": [
       "<pyecharts.render.display.HTML at 0x1aaebfdbee0>"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from pyecharts import options as opts\n",
    "from pyecharts.charts import Map\n",
    "from pyecharts.faker import Faker\n",
    "\n",
    "c = (\n",
    "    Map()\n",
    "    .add(\"广告文案地区分布\", [list(z) for z in zip([i.split('-')[1] for i in dq_name],series_dq[dq_name].values.tolist())], \"深圳\")\n",
    "    .set_global_opts(\n",
    "        title_opts=opts.TitleOpts(title=\"Map-深圳-广告文案\"), visualmap_opts=opts.VisualMapOpts()\n",
    "    )\n",
    "    \n",
    ")\n",
    "c.render_notebook()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "登录cookie __gc_id=2ac265247f1b46ae9a912074658f173b; _ga=GA1.1.597765461.1682506422; __uuid=1682506422329.96; need_bind_tel=false; new_user=false; c_flag=5713a43b31ace1782d727f43d70e7d39; imClientId_0=361750144e9de4dcd301c4fb9208a238; imId_0=361750144e9de4dc12239eefcc348bee; imId=361750144e9de4dc12239eefcc348bee; imClientId=361750144e9de4dcd301c4fb9208a238; access_system=C; XSRF-TOKEN=ghxMXXt-RoWWcr83QqFVtQ; acw_tc=276077d217014126244393078e346addf530c74b9e08a5fb42d90bf46d8aa1; Hm_lvt_a2647413544f5a04f00da7eee0d5e200=1700050490,1701256310,1701363567,1701412625; __tlog=1701412624468.76%7C00000000%7C00000000%7Csm_pc_003%7Csm_pc_003; UniqueKey=c302a80880ac965b6bc56763ae71c6f2; liepin_login_valid=0; lt_auth=vr4DPyRQmwr97HmI3zALtfkb3YqgBDjP9SwNh08C0dHqU6Lk4P%2FmQA%2BHq7UC%2BCoIqx0hf68zMLf%2BNOz%2Fy3VP60QS8FGnlZ6utf6k1X0eTudsHuyflMXuqsjQQJgirXo6ykpgn2si0HU%3D; inited_user=b5ee7120f5575e1aeee9a223f157bcaf; user_roles=0; user_photo=5f8fa3baf6d1ab58476f324908u.png; user_name=%E6%B1%9F%E5%A5%B3%E5%A3%AB; hpo_role-sec_project=sec_project_liepin; hpo_sec_tenant=0; imApp_0=1; Hm_lpvt_a2647413544f5a04f00da7eee0d5e200=1701412666; __session_seq=5; __uv_seq=9; __tlg_event_seq=8; _ga_54YTJKWN86=GS1.1.1701412665.45.1.1701412669.0.0.0; fe_im_socketSequence_new_0=2_2_2; fe_im_opened_pages=; fe_im_connectJson_0=%7B%220_c302a80880ac965b6bc56763ae71c6f2%22%3A%7B%22socketConnect%22%3A%222%22%2C%22connectDomain%22%3A%22liepin.com%22%7D%7D\n",
      "这是第1页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第2页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第3页，接下来将先等待10秒...然后以继续抓取\n",
      "这是第4页，接下来将先等待6秒...然后以继续抓取\n",
      "这是第5页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第6页，接下来将先等待7秒...然后以继续抓取\n",
      "这是第7页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第8页，接下来将先等待10秒...然后以继续抓取\n",
      "这是第9页，接下来将先等待3秒...然后以继续抓取\n",
      "这是第10页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第11页，接下来将先等待10秒...然后以继续抓取\n",
      "这是第12页，接下来将先等待5秒...然后以继续抓取\n",
      "这是第13页，接下来将先等待9秒...然后以继续抓取\n",
      "这是第14页，接下来将先等待4秒...然后以继续抓取\n",
      "这是第15页，接下来将先等待5秒...然后以继续抓取\n"
     ]
    }
   ],
   "source": [
    "import crawl_liepin  \n",
    "  \n",
    "广告文案_深圳_results = crawl_liepin.crawl(城市=\"深圳\",关键词=\"广告文案\",学历='本科',工作经验='',登录cookie=cookie)  \n",
    "  \n",
    "# 将DataFrame保存为Excel文件  \n",
    "广告文案_深圳_results.to_excel(\"广告文案_深圳_results.xlsx\", index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.7"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
